# -*- coding: utf-8 -*-
from datetime import timedelta

from jms.dwd.dwd_warhouse.dwd_wide_summary_waybill_incre import jms_dwd__dwd_wide_summary_waybill_incre
from utils.operators.cluster_for_spark_sql_operator import SparkSqlOperator

# Spark SQL task that runs
# jms/dwd/dwd_warhouse/dwd_wide_unsign_summary_waybill_dt/execute.sql on YARN
# in the 'warehouse' queue.
jms_dwd__dwd_wide_unsign_summary_waybill_dt = SparkSqlOperator(
    task_id='jms_dwd__dwd_wide_unsign_summary_waybill_dt',
    task_concurrency=1,
    pool_slots=10,
    master='yarn',
    name='jms_dwd__dwd_wide_unsign_summary_waybill_dt_{{ execution_date | date_add(1) | cst_ds }}',
    sql='jms/dwd/dwd_warhouse/dwd_wide_unsign_summary_waybill_dt/execute.sql',
    driver_memory='38G',
    driver_cores=4,
    retries=1,
    email=['rongguangfan@jtexpress.com', 'yl_bigdata@yl-scm.com'],
    executor_cores=5,
    executor_memory='20G',
    # When spark.dynamicAllocation.enabled is true, num_executors is the
    # minimum number of executors.
    num_executors=120,
    conf={
        # Enable dynamic resource allocation.
        'spark.dynamicAllocation.enabled': 'true',
        # External shuffle service, required by dynamic allocation.
        'spark.shuffle.service.enabled': 'true',
        # Upper bound on executors when scaling out.
        'spark.dynamicAllocation.maxExecutors': 130,
        # Timeout (seconds) before an idle executor holding cached data is
        # released.
        'spark.dynamicAllocation.cachedExecutorIdleTimeout': 180,
        # Allow overwriting only the partitions that the job writes.
        'spark.sql.sources.partitionOverwriteMode': 'dynamic',
        # Off-heap memory per executor.
        'spark.executor.memoryOverhead': '6G',
        'spark.sql.shuffle.partitions': 4500,
        # Key was previously misspelled as 'spark.default.paralleism', so the
        # setting was silently ignored by Spark.
        'spark.default.parallelism': 4500,
        # NOTE(review): the documented values for this Hive setting are
        # 'strict' / 'nonstrict'; 'true' is presumably meant as 'nonstrict'
        # (see the disabled hiveconf below) -- confirm before changing.
        'spark.hadoop.hive.exec.dynamic.partition.mode': 'true',
        'spark.reducer.maxSizeInFlight': '96M',
        'spark.shuffle.file.buffer': '64k',
        'spark.shuffle.io.retryWait': '20',
        # NOTE(review): legacy memory-manager setting; verify it still has an
        # effect on the Spark version used by this cluster.
        'spark.shuffle.memoryFraction': '0.8',
        'spark.executor.extraJavaOptions': '-XX:+UseG1GC -XX:ParallelGCThreads=5',
    },
    # Disabled Hive dynamic-partition settings, kept for reference:
    # hiveconf={'hive.exec.dynamic.partition': 'true',  # dynamic partitioning
    #           'hive.exec.dynamic.partition.mode': 'nonstrict',
    #           'hive.exec.max.dynamic.partitions': 1800,  # 60 partitions are generated per day
    #           'hive.exec.max.dynamic.partitions.pernode': 180,  # 60 partitions are generated per day
    #           },
    yarn_queue='warehouse',
    # Previous setting: execution_timeout=timedelta(hours=2)
    # Average duration according to the Excel record: 13 min 0 s.
    execution_timeout=timedelta(minutes=90),
)

# Upstream dependency: this task is wired to run downstream of the
# incremental wide summary waybill task.
jms_dwd__dwd_wide_unsign_summary_waybill_dt << [jms_dwd__dwd_wide_summary_waybill_incre]
